% Venue and journal name macros. Reference them unquoted in entries,
% e.g. booktitle = icml or journal = tac.
% Leading organisation acronyms are braced uniformly so that they keep their
% case under styles that recase venue names.
@string{icml       = {International Conference on Machine Learning (ICML)}}
@string{colt       = {Conference on Learning Theory (COLT)}}
@string{nips       = {Neural Information Processing Systems (NIPS)}}
@string{ijrr       = {International Journal of Robotics Research}}
@string{isrr       = {International Symposium on Robotics Research (ISRR)}}
@string{icra       = {{IEEE} International Conference on Robotics and Automation (ICRA)}}
@string{iros       = {{IEEE} International Conference on Intelligent Robots and Systems (IROS)}}
@string{humanoids  = {{IEEE-RAS} International Conference on Humanoid Robotics (Humanoids)}}
@string{jmlr       = {Journal of Machine Learning Research}}
@string{iclr       = {International Conference on Learning Representations (ICLR)}}
@string{uai        = {Uncertainty in Artificial Intelligence (UAI)}}
@string{tpami      = {{IEEE} Transactions on Pattern Analysis and Machine Intelligence}}
@string{tac        = {{IEEE} Transactions on Automatic Control}}
@string{automatica = {Automatica}}
@string{jfr        = {Journal of Field Robotics}}
@string{ar         = {Autonomous Robots}}
@string{ijcai      = {International Joint Conference on Artificial Intelligence (IJCAI)}}
@string{aaai       = {{AAAI} Conference on Artificial Intelligence}}
@string{cvpr       = {{IEEE} Conference on Computer Vision and Pattern Recognition (CVPR)}}
@string{eccv       = {European Conference on Computer Vision (ECCV)}}
@string{aistats    = {Artificial Intelligence and Statistics (AISTATS)}}
@string{acc        = {American Control Conference (ACC)}}
@string{cdc        = {{IEEE} Conference on Decision and Control (CDC)}}
@string{nc         = {Neural Computation}}
@string{jasa       = {Journal of the American Statistical Association}}
@string{wafr       = {Workshop on the Algorithmic Foundations of Robotics (WAFR)}}
@string{corl       = {Conference on Robot Learning (CoRL)}}
@string{rss        = {Robotics: Science and Systems (RSS)}}
@string{jgcd       = {{AIAA} Journal of Guidance, Control, and Dynamics}}
@string{tsc        = {{IEEE} Transactions on Control Systems Technology}}


% planning

@book{lavalle2006planning,
  author    = {LaValle, Steven M.},
  title     = {Planning algorithms},
  publisher = {Cambridge University Press},
  year      = {2006},
}

% adaptive control

@book{ioannou2012robust,
  author    = {Ioannou, Petros A. and Sun, Jing},
  title     = {Robust adaptive control},
  publisher = {Courier Corporation},
  year      = {2012},
}


% optimization 

@book{bertsekas2016nonlinear,
  author    = {Bertsekas, Dimitri P.},
  title     = {Nonlinear programming},
  publisher = {Athena Scientific},
  year      = {2016},
}

@book{bertsimas1997introduction,
  author    = {Bertsimas, Dimitris and Tsitsiklis, John N.},
  title     = {Introduction to linear optimization},
  publisher = {Athena Scientific},
  year      = {1997},
}

% No journal is recorded for this work, so it is typed as misc rather than
% article (article requires a journal field).
% NOTE(review): add the publication venue or issuing institution once confirmed.
@misc{powell2012ai,
  author = {Powell, Warren B.},
  title  = {{AI}, {OR} and control theory: A {Rosetta} stone for stochastic optimization},
  year   = {2012},
}

@book{boyd2004convex,
  author    = {Boyd, Stephen and Vandenberghe, Lieven},
  title     = {Convex optimization},
  publisher = {Cambridge University Press},
  year      = {2004},
}

% Course lecture notes, not a journal article: typed as misc with the course
% recorded in howpublished instead of journal.
@misc{kolter2008convex,
  author       = {Kolter, Zico},
  title        = {Convex Optimization Overview},
  howpublished = {CS 229 Lecture Notes},
  year         = {2008},
}

% DP (dynamic programming)

% NOTE(review): volume has no accompanying series field; confirm whether it
% denotes a series number.
@book{altman1999constrained,
  author    = {Altman, Eitan},
  title     = {Constrained {Markov} decision processes},
  volume    = {7},
  publisher = {CRC Press},
  year      = {1999},
}

% NOTE(review): the citation key says 1995 while year/edition describe a 2012
% fourth edition; the key is kept so existing citations still resolve.
% The former number field (which needs a series) is stored as volume, on the
% assumption that it refers to Volume 1 of the two-volume set; confirm.
@book{bertsekas1995dynamic,
  author    = {Bertsekas, Dimitri P.},
  title     = {Dynamic programming and optimal control},
  volume    = {1},
  edition   = {4},
  publisher = {Athena Scientific},
  year      = {2012},
}

% Initials are written separately so abbreviating styles keep both of them.
@book{anderson2007optimal,
  author    = {Anderson, Brian D. O. and Moore, John B.},
  title     = {Optimal control: linear quadratic methods},
  publisher = {Courier Corporation},
  year      = {2007},
}

% Iterative LQG for constrained nonlinear stochastic systems (ACC paper).
@inproceedings{todorov2005generalized,
  author    = {Todorov, Emanuel and Li, Weiwei},
  title     = {A generalized iterative {LQG} method for locally-optimal feedback control of constrained nonlinear stochastic systems},
  booktitle = acc,
  year      = {2005},
}

% Author name spelled as in the other Todorov entries of this file so that
% styles do not treat it as a different person.
@inproceedings{tassa2014control,
  author    = {Tassa, Yuval and Mansard, Nicolas and Todorov, Emanuel},
  title     = {Control-limited differential dynamic programming},
  booktitle = icra,
  year      = {2014},
}

% Neural network policies trained with trajectory optimization (ICML paper).
@inproceedings{levine2014learning,
  author    = {Levine, Sergey and Koltun, Vladlen},
  title     = {Learning complex neural network policies with trajectory optimization},
  booktitle = icml,
  year      = {2014},
}

% Differential dynamic programming monograph; names use the Last, First form.
@book{mayne1970ddp,
  author    = {Jacobson, David and Mayne, David},
  title     = {Differential Dynamic Programming},
  publisher = {Elsevier},
  year      = {1970},
}

% Online trajectory optimization for complex behaviors (IROS paper).
@inproceedings{tassa2012synthesis,
  author    = {Tassa, Yuval and Erez, Tom and Todorov, Emanuel},
  title     = {Synthesis and stabilization of complex behaviors through online trajectory optimization},
  booktitle = iros,
  year      = {2012},
}

% The proper noun in the title is braced so sentence-casing styles keep its capital.
@techreport{liao1992advantages,
  author      = {Liao, Li-zhi and Shoemaker, Christine A.},
  title       = {Advantages of differential dynamic programming over {Newton's} method for discrete-time optimal control problems},
  institution = {Cornell University},
  year        = {1992},
}

@inproceedings{xie2017differential,
  author    = {Xie, Zhaoming and Liu, C. Karen and Hauser, Kris},
  title     = {Differential dynamic programming with nonlinear constraints},
  booktitle = icra,
  year      = {2017},
}

% Equality-constrained iterative LQ optimal control (Humanoids paper).
@inproceedings{giftthaler2017projection,
  author    = {Giftthaler, Markus and Buchli, Jonas},
  title     = {A projection approach to equality constrained iterative linear quadratic optimal control},
  booktitle = humanoids,
  year      = {2017},
}

% Title carries no trailing period; the bibliography style supplies punctuation.
@inproceedings{li2004iterative,
  author    = {Li, Weiwei and Todorov, Emanuel},
  title     = {Iterative linear quadratic regulator design for nonlinear biological movement systems},
  booktitle = {International Conference on Informatics in Control, Automation, and Robotics},
  year      = {2004},
}

% HJB

% The proper names in the title are braced so sentence-casing styles keep their capitals.
@article{mitchell2005time,
  author  = {Mitchell, Ian M. and Bayen, Alexandre M. and Tomlin, Claire J.},
  title   = {A time-dependent {Hamilton-Jacobi} formulation of reachable sets for continuous dynamic games},
  journal = tac,
  year    = {2005},
}

% No journal is recorded for this tutorial, so it is typed as misc rather than
% article (article requires a journal field).
% NOTE(review): add the issuing institution or venue once confirmed.
@misc{bressan2010noncooperative,
  author = {Bressan, Alberto},
  title  = {Noncooperative differential games. {A} tutorial},
  year   = {2010},
}

@book{kirk2012optimal,
  author    = {Kirk, Donald E.},
  title     = {Optimal control theory: an introduction},
  publisher = {Courier Corporation},
  year      = {2012},
}

% Indirect

% Applied optimal control textbook; names use the Last, First form.
@book{bryson1975applied,
  author    = {Bryson, Arthur and Ho, Yu-Chi},
  title     = {Applied Optimal Control: Optimization, Estimation and Control},
  publisher = {CRC Press},
  year      = {1975},
}

% Typed as a book: the entry carries a publisher and no journal.
@book{lee1967foundations,
  author    = {Lee, Ernest Bruce and Markus, Lawrence},
  title     = {Foundations of optimal control theory},
  publisher = {Wiley},
  year      = {1967},
}

% Direct

% arXiv preprint: the identifier lives in the eprint fields instead of journal.
% The url field keeps the identifier visible under styles that ignore eprint.
@misc{kelly2017transcription,
  author        = {Kelly, Matthew},
  title         = {Transcription Methods for Trajectory Optimization: a beginners tutorial},
  year          = {2017},
  eprint        = {1707.00284},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/1707.00284},
}

% Direct collocation tutorial published in SIAM Review.
@article{kelly2017introduction,
  author  = {Kelly, Matthew},
  title   = {An introduction to trajectory optimization: how to do your own direct collocation},
  journal = {SIAM Review},
  year    = {2017},
}

% MPC

% Predictive control textbook for linear and hybrid systems.
@book{borrelli2017predictive,
  author    = {Borrelli, Francesco and Bemporad, Alberto and Morari, Manfred},
  title     = {Predictive control for linear and hybrid systems},
  publisher = {Cambridge University Press},
  year      = {2017},
}

@book{rawlings2017model,
  author    = {Rawlings, James Blake and Mayne, David Q. and Diehl, Moritz},
  title     = {Model Predictive Control: Theory, Computation, and Design},
  publisher = {Nob Hill Publishing},
  year      = {2017},
}

% Adaptive Optimal Control

% Encyclopedia article on system identification.
@article{ljung1999system,
  author  = {Ljung, Lennart},
  title   = {System identification},
  journal = {Wiley Encyclopedia of Electrical and Electronics Engineering},
  year    = {1999},
}

@book{aastrom2013adaptive,
  author    = {{\AA}str{\"o}m, Karl J. and Wittenmark, Bj{\"o}rn},
  title     = {Adaptive control},
  publisher = {Courier Corporation},
  year      = {2013},
}

@article{simon1956dynamic,
  author  = {Simon, Herbert A.},
  title   = {Dynamic programming under uncertainty with a quadratic criterion function},
  journal = {Econometrica},
  year    = {1956},
}

% NOTE(review): the second author is recorded with a single initial only;
% confirm the full given name against the published paper.
@article{becker1985adaptive,
  author  = {Becker, Arthur and Kumar, P. and Wei, Ching-Zong},
  title   = {Adaptive control with the stochastic approximation algorithm: Geometry and convergence},
  journal = tac,
  year    = {1985},
}

% Conference paper: the venue macro belongs in booktitle of an inproceedings
% entry, not in journal of an article.
@inproceedings{abbasi2011regret,
  author    = {Abbasi-Yadkori, Yasin and Szepesv{\'a}ri, Csaba},
  title     = {Regret bounds for the adaptive control of linear quadratic systems},
  booktitle = colt,
  year      = {2011},
}

% Conference paper: the venue macro belongs in booktitle of an inproceedings
% entry, not in journal of an article.
@inproceedings{moldovan2015optimism,
  author    = {Moldovan, Teodor Mihai and Levine, Sergey and Jordan, Michael I. and Abbeel, Pieter},
  title     = {Optimism-driven exploration for nonlinear systems},
  booktitle = icra,
  year      = {2015},
}

% Conference paper: the venue macro belongs in booktitle of an inproceedings
% entry, not in journal of an article.
@inproceedings{osband2016generalization,
  author    = {Osband, Ian and Van Roy, Benjamin and Wen, Zheng},
  title     = {Generalization and Exploration via Randomized Value Functions},
  booktitle = icml,
  year      = {2016},
}

% NOTE(review): the trailing "and others" looked like an export artifact and
% was dropped; confirm that the three listed authors are the complete list.
@book{zhou1996robust,
  author    = {Zhou, Kemin and Doyle, John Comstock and Glover, Keith},
  title     = {Robust and optimal control},
  publisher = {Prentice Hall},
  year      = {1996},
}

% regression 

% Publisher added because book entries require one.
% NOTE(review): volume has no accompanying series and may be an export
% artifact (possibly an edition number); confirm against the book.
@book{friedman2008elements,
  author    = {Friedman, Jerome and Hastie, Trevor and Tibshirani, Robert},
  title     = {The elements of statistical learning},
  volume    = {2},
  publisher = {Springer},
  year      = {2008},
}

@book{murphy2012machine,
  author    = {Murphy, Kevin P.},
  title     = {Machine learning: a probabilistic perspective},
  publisher = {{MIT} Press},
  year      = {2012},
}

% Springer is a publisher, so it is stored in publisher rather than organization.
% NOTE(review): booktitle was missing (required for inproceedings); the value
% below should be confirmed against the published volume.
@inproceedings{rasmussen2003gaussian,
  author    = {Rasmussen, Carl Edward},
  title     = {{Gaussian} processes in machine learning},
  booktitle = {Summer School on Machine Learning},
  publisher = {Springer},
  year      = {2003},
}

% Typed as misc: the entry has neither a journal nor a year, both of which
% article requires.
% NOTE(review): add the year/version of the edition actually consulted.
@misc{petersenmatrix,
  author = {Petersen, Kaare Brandt and Pedersen, Michael Syskind},
  title  = {The Matrix Cookbook},
}

% The dataset name is braced so its internal capital survives sentence casing.
@inproceedings{krizhevsky2012imagenet,
  author    = {Krizhevsky, Alex and Sutskever, Ilya and Hinton, Geoffrey E.},
  title     = {{ImageNet} classification with deep convolutional neural networks},
  booktitle = nips,
  year      = {2012},
}

@book{goodfellow2016deep,
  author    = {Goodfellow, Ian and Bengio, Yoshua and Courville, Aaron},
  title     = {Deep learning},
  publisher = {{MIT} Press},
  year      = {2016},
}

@book{sutton2018reinforcement,
  author    = {Sutton, Richard S. and Barto, Andrew G.},
  title     = {Reinforcement learning: An introduction},
  publisher = {{MIT} Press},
  year      = {2018},
}


% model-free

% The author list ends with "and others", which styles render as et al.
@article{mnih2015human,
  author  = {Mnih, Volodymyr and Kavukcuoglu, Koray and Silver, David and Rusu, Andrei A. and Veness, Joel and Bellemare, Marc G. and Graves, Alex and Riedmiller, Martin and Fidjeland, Andreas K. and Ostrovski, Georg and others},
  title   = {Human-level control through deep reinforcement learning},
  journal = {Nature},
  year    = {2015},
}

% The capital Q is braced so sentence-casing styles do not lowercase it.
@inproceedings{riedmiller2005neural,
  author    = {Riedmiller, Martin},
  title     = {Neural fitted {Q} iteration--first experiences with a data efficient neural reinforcement learning method},
  booktitle = {European Conference on Machine Learning},
  year      = {2005},
}

% The lowercase particle lets BibTeX parse "van" as the von part of the name,
% so the author sorts and abbreviates under Hasselt.
@inproceedings{van2016deep,
  author    = {van Hasselt, Hado and Guez, Arthur and Silver, David},
  title     = {Deep reinforcement learning with double {Q}-learning},
  booktitle = aaai,
  year      = {2016},
}

% Technical report on neural-network reinforcement learning for robots.
@techreport{lin1993reinforcement,
  author      = {Lin, Long-Ji},
  title       = {Reinforcement learning for robots using neural networks},
  institution = {Carnegie-Mellon University},
  year        = {1993},
}